{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Scratch list of other account names, kept as an unassigned string literal so it\n",
    "# has no effect at runtime (presumably further accounts to scrape - TODO confirm).\n",
    "# Only the `公众号` assignment below is live code; it is the name typed into the\n",
    "# account search box and substituted into the output file names.\n",
    "'''\n",
    "阿里研究院\n",
    "阿里健康\n",
    "阿里巴巴商学院\n",
    "阿里数据\n",
    "\n",
    "腾讯金融科技\n",
    "腾讯研究院\n",
    "腾讯媒体研究院\n",
    "腾讯云启研究院\n",
    "酷鹅用户研究院\n",
    "'''\n",
    "公众号 = \"野生运营社区\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Output path templates. The `{公众号}` placeholder is filled in with\n",
    "# `.format(公众号=...)` at the point where a file is written.\n",
    "fn = {\n",
    "    \"output\": {\n",
    "        \"公众号_htm_snippets\": \"data_raw_src/公众号_htm_snippets_{公众号}.tsv\",\n",
    "        \"公众号_df\": \"data_raw_src/公众号_df_{公众号}.tsv\",\n",
    "        \"公众号_xlsx\": \"data_sets/公众号_url_{公众号}.xlsx\",\n",
    "    },\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "import pickle\n",
    "import time\n",
    "from getpass import getpass\n",
    "from random import random\n",
    "\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "from lxml.html import fromstring\n",
    "\n",
    "# when selenium main_content is used\n",
    "# Parses an HTML document from a string constant.  Returns the root node\n",
    "# root = fromstring(df.loc[1,\"html_snippets\"]) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities\n",
    "\n",
    "# Optional capability override, currently disabled:\n",
    "#caps=dict()\n",
    "#caps[\"pageLoadStrategy\"] = \"none\"   # Do not wait for full page load\n",
    "\n",
    "# Chrome launch options for the Selenium session.\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # works around the \"DevToolsActivePort file doesn't exist\" error\n",
    "opts.add_argument('window-size=1920x3000')  # requested browser window size\n",
    "# NOTE(review): Chrome's documented switch form is `--window-size=W,H`; confirm this `WxH` value is honoured.\n",
    "opts.add_argument('--disable-gpu')  # per the original note: Google's docs suggest this flag to avoid a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, for some special pages\n",
    "#opts.add_argument('blink-settings=imagesEnabled=false')  # do not load images, to speed things up\n",
    "#opts.add_argument('--headless')  # no visible browser window; per the original note, needed on Linux without a display\n",
    "\n",
    "# NOTE(review): absolute, machine-specific path to the Chrome binary; adjust for the local install.\n",
    "opts.binary_location = r\"C:\\Program Files (x86)\\Google\\Chrome\\Application\\chrome.exe\"\n",
    "\n",
    "# Start the browser; `driver` is the session that every later cell drives.\n",
    "driver = webdriver.Chrome( options = opts)  # desired_capabilities=caps is disabled"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Load https://mp.weixin.qq.com in the Selenium-controlled browser; the login\n",
    "# steps in the following cells run against this page.\n",
    "driver.get(\"https://mp.weixin.qq.com\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Login credentials are taken from the environment, or prompted for when the\n",
    "# variables are unset, so that no account name or password is ever stored in the\n",
    "# notebook file. `getpass` keeps the typed password out of the cell output.\n",
    "payload = {\n",
    "    \"account\": os.environ.get(\"WECHAT_MP_ACCOUNT\") or input(\"WeChat MP account: \"),\n",
    "    \"password\": os.environ.get(\"WECHAT_MP_PASSWORD\") or getpass(\"WeChat MP password: \"),\n",
    "}\n",
    "# Click the link inside the scan-type login container (presumably this switches\n",
    "# the page from QR-code login to the account/password form - TODO confirm).\n",
    "driver.find_element_by_xpath('//div[@class=\"login__type__container login__type__container__scan\"]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Fill in the login form: clear each input, then type the matching value from `payload`.\n",
    "# The element is looked up again before every action rather than being cached.\n",
    "driver.find_element_by_xpath('//form[@class=\"login_form\"]//input[@name=\"account\"]').clear()\n",
    "driver.find_element_by_xpath('//form[@class=\"login_form\"]//input[@name=\"account\"]').send_keys(payload['account'])\n",
    "driver.find_element_by_xpath('//form[@class=\"login_form\"]//input[@name=\"password\"]').clear()\n",
    "driver.find_element_by_xpath('//form[@class=\"login_form\"]//input[@name=\"password\"]').send_keys(payload['password'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the link inside `login_btn_panel` (presumably the login/submit button - TODO confirm).\n",
    "driver.find_element_by_xpath('//div[@class=\"login_btn_panel\"]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'展开'"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the innerHTML of the link with id `m_open`; the bare last expression echoes\n",
    "# it as the cell output (presumably a check that the logged-in page has loaded).\n",
    "element = driver.find_element_by_xpath('//a[@id=\"m_open\"]')\n",
    "main_content = element.get_attribute('innerHTML')\n",
    "main_content\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Scroll the page to the bottom by running JavaScript in the browser.\n",
    "driver.execute_script(\"window.scrollTo(0,document.body.scrollHeight)\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'https://mp.weixin.qq.com/cgi-bin/appmsg?begin=0&count=10&t=media/appmsg_list&type=10&action=list&token=136414360&lang=zh_CN'"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Find the link inside the <li> whose title contains \"素材管理\" and keep its href;\n",
    "# the next cell navigates to that URL.\n",
    "element = driver.find_element_by_xpath('//li[@title[contains(.,\"素材管理\")]]/a') \n",
    "# main_content = element.get_attribute('innerHTML')\n",
    "# main_content\n",
    "url_素材管理= element.get_attribute(\"href\")\n",
    "url_素材管理"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Navigate to the \"素材管理\" URL captured in the previous cell.\n",
    "driver.get(url_素材管理)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Find the first node whose text contains \"新建图文消息\" and click it.\n",
    "element = driver.find_element_by_xpath('//*[text()[contains(.,\"新建图文消息\")]]') \n",
    "main_content = element.get_attribute('innerHTML')\n",
    "main_content  # no visible effect: only a cell's final expression is displayed\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "['CDwindow-C22DA581FC49A1C7AD319096C8B24305', 'CDwindow-71CAE10DAF76E91B35437BA6F99AD65A']\n"
     ]
    }
   ],
   "source": [
    "# List the handles of all open browser windows (the click above opened a second one).\n",
    "print (driver.window_handles)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Clicking \"新建图文消息\" opened a separate window, so switch the driver to it\n",
    "# (the last entry in `window_handles`).\n",
    "driver.switch_to.window(driver.window_handles[-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "                超链接              \n"
     ]
    }
   ],
   "source": [
    "# Find the first node whose text contains \"超链接\", print its innerHTML as a\n",
    "# sanity check, then click it.\n",
    "element = driver.find_element_by_xpath('//*[text()[contains(.,\"超链接\")]]') \n",
    "main_content = element.get_attribute('innerHTML')\n",
    "print(main_content)\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "选择其他公众号\n"
     ]
    }
   ],
   "source": [
    "# Click \"选择其他公众号\" (\"choose another official account\"): find the first node\n",
    "# containing that text, print its innerHTML as a sanity check, then click it.\n",
    "element = driver.find_element_by_xpath('//*[text()[contains(.,\"选择其他公众号\")]]') \n",
    "main_content = element.get_attribute('innerHTML')\n",
    "print(main_content)\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Clear the account search input inside `inner_link_account_area`, then type the\n",
    "# target account name (`公众号`) into it.\n",
    "driver.find_element_by_xpath('//form//div[@class=\"inner_link_account_area\"]//input[@class=\"weui-desktop-form__input\"]').clear()\n",
    "driver.find_element_by_xpath('//form//div[@class=\"inner_link_account_area\"]//input[@class=\"weui-desktop-form__input\"]').send_keys(公众号)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<div class=\"weui-desktop-icon weui-desktop-icon__inputSearch weui-desktop-icon__small\"><!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <!----> <svg width=\"16\" height=\"16\" viewBox=\"0 0 16 16\" xmlns=\"http://www.w3.org/2000/svg\"><path d=\"M11.33 10.007l4.273 4.273a.502.502 0 0 1 .005.709l-.585.584a.499.499 0 0 1-.709-.004L10.046 11.3a6.278 6.278 0 1 1 1.284-1.294zm.012-3.729a5.063 5.063 0 1 0-10.127 0 5.063 5.063 0 0 0 10.127 0z\"></path></svg> <!----> <!----> <!----> <!----></div>\n"
     ]
    }
   ],
   "source": [
    "# Click the magnifier (search) button: locate it, print its innerHTML as a sanity\n",
    "# check, then click to run the search.\n",
    "element = driver.find_element_by_xpath('//button[@class=\"weui-desktop-icon-btn weui-desktop-search__btn\"]')\n",
    "main_content = element.get_attribute('innerHTML')\n",
    "print(main_content)\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<li class=\"inner_link_account_item\"><div class=\"weui-desktop-vm_primary\"><img src=\"http://mmbiz.qpic.cn/mmbiz_png/NicaNwCeMyEPGbwEH6gYYkvFBYYaWO51mutNuzf0OcycCuFBhIesQqhuOAgwPRKyK45ia88U4XroBibBVdF7Tmfdw/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">野生运营社区</strong> <i class=\"inner_link_account_wechat\">微信号：dugu9bubai</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">订阅号</div></li><li class=\"inner_link_account_item\"><div class=\"weui-desktop-vm_primary\"><img src=\"http://mmbiz.qpic.cn/mmbiz_png/vCO8J2FI7ibOyTM0FpTXglnXJaMhvIVAAHZiaDY9suC48gl8q6iavIOdicMH0Sz6ia1ZPONPHcn3KBicx1Sy7Wck3D7Q/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">野生运营小圈子</strong> <i class=\"inner_link_account_wechat\">微信号：zsd-study</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">订阅号</div></li><li class=\"inner_link_account_item\"><div class=\"weui-desktop-vm_primary\"><img src=\"http://mmbiz.qpic.cn/mmbiz_png/qmbg5Mtd7CPr34SxxMzqicicL15oibk296SyXwXk9BBUSmH7V0lVTr15icJsujRQWeXZoI5AIQYKfCg6ZH7UxSTXjw/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">野生运营后进生</strong> <i class=\"inner_link_account_wechat\">微信号：ZT_anita</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">订阅号</div></li><li class=\"inner_link_account_item\"><div class=\"weui-desktop-vm_primary\"><img src=\"http://mmbiz.qpic.cn/mmbiz_png/a2Jnxwt4GjfuRI791RVhnicsaAdtwmia5PeTk1micIhSvKSOG6VvJ9KbaDFGPiagQEAr7s0W8jcBsYvQ4SZxVEwI9Q/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">野生运营进化论</strong> <i class=\"inner_link_account_wechat\">微信号：sunweiox</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">订阅号</div></li><li class=\"inner_link_account_item\"><div class=\"weui-desktop-vm_primary\"><img 
src=\"http://mmbiz.qpic.cn/mmbiz_png/gfVw1Ev6nLvaFPbPazC9NTzLr6pot7p18wiaMHLialvuGcFVwpY3Gf9vojs2XYfVTo4WV5NZalMcdsjOsVn6vZuA/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">许大姐野生河鲜销售部</strong> <i class=\"inner_link_account_wechat\">微信号：未设置</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">服务号</div></li>\n"
     ]
    }
   ],
   "source": [
    "# Capture the innerHTML of the account result list (`inner_link_account_list`) and\n",
    "# keep it as `公众号SERP` for parsing in the next cells.\n",
    "element = driver.find_element_by_xpath('//ul[@class=\"inner_link_account_list\"]')\n",
    "main_content = element.get_attribute('innerHTML')\n",
    "print(main_content)\n",
    "公众号SERP = main_content\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parse the captured account-list HTML into an lxml element tree.\n",
    "root = fromstring(公众号SERP) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "# One <li class=\"inner_link_account_item\"> per account returned by the search.\n",
    "主 = root.xpath('//li[@class=\"inner_link_account_item\"]')\n",
    "\n",
    "# For each result keep the display name, the WeChat-id line and the avatar URL.\n",
    "# `[0]` takes the first match of each relative XPath within the <li>.\n",
    "account_list = [\n",
    "    {\n",
    "        \"nickname\": item.xpath('./div/strong[@class=\"inner_link_account_nickname\"]')[0].text,\n",
    "        \"wechat\": item.xpath('./div/i[@class=\"inner_link_account_wechat\"]')[0].text,\n",
    "        \"img\": item.xpath('./div/img/@src')[0],\n",
    "    }\n",
    "    for item in 主\n",
    "]\n",
    "\n",
    "df_account = pd.DataFrame(account_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>img</th>\n",
       "      <th>nickname</th>\n",
       "      <th>wechat</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>http://mmbiz.qpic.cn/mmbiz_png/NicaNwCeMyEPGbw...</td>\n",
       "      <td>野生运营社区</td>\n",
       "      <td>微信号：dugu9bubai</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>http://mmbiz.qpic.cn/mmbiz_png/vCO8J2FI7ibOyTM...</td>\n",
       "      <td>野生运营小圈子</td>\n",
       "      <td>微信号：zsd-study</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>http://mmbiz.qpic.cn/mmbiz_png/qmbg5Mtd7CPr34S...</td>\n",
       "      <td>野生运营后进生</td>\n",
       "      <td>微信号：ZT_anita</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>http://mmbiz.qpic.cn/mmbiz_png/a2Jnxwt4GjfuRI7...</td>\n",
       "      <td>野生运营进化论</td>\n",
       "      <td>微信号：sunweiox</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>http://mmbiz.qpic.cn/mmbiz_png/gfVw1Ev6nLvaFPb...</td>\n",
       "      <td>许大姐野生河鲜销售部</td>\n",
       "      <td>微信号：未设置</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 img    nickname  \\\n",
       "0  http://mmbiz.qpic.cn/mmbiz_png/NicaNwCeMyEPGbw...      野生运营社区   \n",
       "1  http://mmbiz.qpic.cn/mmbiz_png/vCO8J2FI7ibOyTM...     野生运营小圈子   \n",
       "2  http://mmbiz.qpic.cn/mmbiz_png/qmbg5Mtd7CPr34S...     野生运营后进生   \n",
       "3  http://mmbiz.qpic.cn/mmbiz_png/a2Jnxwt4GjfuRI7...     野生运营进化论   \n",
       "4  http://mmbiz.qpic.cn/mmbiz_png/gfVw1Ev6nLvaFPb...  许大姐野生河鲜销售部   \n",
       "\n",
       "           wechat  \n",
       "0  微信号：dugu9bubai  \n",
       "1   微信号：zsd-study  \n",
       "2    微信号：ZT_anita  \n",
       "3    微信号：sunweiox  \n",
       "4         微信号：未设置  "
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the parsed search results (one row per account).\n",
    "df_account"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<div class=\"weui-desktop-vm_primary\"><img src=\"http://mmbiz.qpic.cn/mmbiz_png/NicaNwCeMyEPGbwEH6gYYkvFBYYaWO51mutNuzf0OcycCuFBhIesQqhuOAgwPRKyK45ia88U4XroBibBVdF7Tmfdw/0?wx_fmt=png\" class=\"inner_link_account_avatar\"> <strong class=\"inner_link_account_nickname\">野生运营社区</strong> <i class=\"inner_link_account_wechat\">微信号：dugu9bubai</i></div> <div class=\"weui-desktop-vm_default inner_link_account_type\">订阅号</div>\n"
     ]
    }
   ],
   "source": [
    "# Select the first <li> of the account result list: print its innerHTML as a\n",
    "# sanity check, then click it.\n",
    "element = driver.find_element_by_xpath('//ul[@class=\"inner_link_account_list\"]/li')\n",
    "main_content = element.get_attribute('innerHTML')\n",
    "print(main_content)\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'\\n跳转_input = driver.find_element_by_xpath(\\'//span[@class=\"weui-desktop-pagination__form\"]/input\\')\\n跳转_a = driver.find_element_by_xpath(\\'//span[@class=\"weui-desktop-pagination__form\"]/a\\')\\n跳转_input.clear()\\n跳转_input.send_keys(2)\\n跳转_a.click()\\n'"
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Page-jump test, disabled by wrapping it in a string literal. Nothing in it runs;\n",
    "# because the literal is the cell's last expression, its repr is echoed as output.\n",
    "'''\n",
    "跳转_input = driver.find_element_by_xpath('//span[@class=\"weui-desktop-pagination__form\"]/input')\n",
    "跳转_a = driver.find_element_by_xpath('//span[@class=\"weui-desktop-pagination__form\"]/a')\n",
    "跳转_input.clear()\n",
    "跳转_input.send_keys(2)\n",
    "跳转_a.click()\n",
    "'''"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 35]\n",
      "False\n"
     ]
    }
   ],
   "source": [
    "# Upper bound for page jumps: read every pagination number label and convert its\n",
    "# text to int. The last entry is used as the final page number by the next cell.\n",
    "l_e = driver.find_elements_by_xpath('//label[@class=\"weui-desktop-pagination__num\"]')\n",
    "l_e_int  = [int(x.text) for x in l_e] \n",
    "print (l_e_int)\n",
    "# True when the first and last labels carry the same number.\n",
    "print (l_e_int[0]==l_e_int[-1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35]\n"
     ]
    }
   ],
   "source": [
    "# Every page number from 1 through the highest number read from the pagination labels.\n",
    "last_page = l_e_int[-1]\n",
    "pages = list(range(1, last_page + 1))\n",
    "print(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Global variables.\n",
    "# `html_raw` maps page number -> innerHTML of that page's article list; it is\n",
    "# filled in by `process_pages`.\n",
    "html_raw = dict()\n",
    "# Reset the scratch names used by earlier cells. Note that `process_pages` assigns\n",
    "# its own local `main_content` / `element` (it has no `global` statement), so these\n",
    "# module-level values are not updated by it.\n",
    "main_content =\"\"\n",
    "element = None"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [],
   "source": [
    "def process_pages(pages, min_delay=45, jitter=120):\n",
    "    \"\"\"Visit each page of the article list and store its HTML in `html_raw`.\n",
    "\n",
    "    For every page number the pagination jump box is cleared, the number is typed\n",
    "    in, the jump link is clicked, and after a randomised pause the innerHTML of the\n",
    "    `inner_link_article_list` container is saved as `html_raw[p]`.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    pages : iterable of int\n",
    "        Page numbers to visit, in order.\n",
    "    min_delay : float, optional\n",
    "        Seconds always waited after triggering a jump (default 45).\n",
    "    jitter : float, optional\n",
    "        Upper bound, in seconds, of the extra random wait added on top of\n",
    "        `min_delay` (default 120).\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    None\n",
    "        Results are written into the module-level `html_raw` dict; the\n",
    "        module-level `driver` performs all browser interaction.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        # Progress indicator: page numbers on one tab-separated line.\n",
    "        print(p, end='\\t')\n",
    "\n",
    "        # Re-locate the jump controls on every iteration, then jump to page p.\n",
    "        跳转_input = driver.find_element_by_xpath('//span[@class=\"weui-desktop-pagination__form\"]/input')\n",
    "        跳转_a = driver.find_element_by_xpath('//span[@class=\"weui-desktop-pagination__form\"]/a')\n",
    "        跳转_input.clear()\n",
    "        跳转_input.send_keys(p)\n",
    "        跳转_a.click()\n",
    "\n",
    "        # Randomised pause before reading the list (presumably to let it reload and\n",
    "        # to throttle requests - TODO confirm the intended rationale).\n",
    "        time.sleep(min_delay + jitter * random())\n",
    "\n",
    "        element = driver.find_element_by_xpath('//div[@class=\"inner_link_article_list\"]')\n",
    "        main_content = element.get_attribute('innerHTML')\n",
    "        html_raw[p] = main_content"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t11\t12\t13\t14\t15\t16\t17\t18\t19\t20\t21\t22\t23\t24\t25\t26\t27\t28\t29\t30\t31\t32\t33\t34\t35\t"
     ]
    }
   ],
   "source": [
    "# Scrape every page in `pages`. Long-running: process_pages sleeps for a\n",
    "# randomised interval after each page jump.\n",
    "process_pages(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>&lt;div&gt;&lt;label class=\"inner_link_article_item\"&gt;&lt;s...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        html_snippets\n",
       "1   <div><label class=\"inner_link_article_item\"><s...\n",
       "2   <div><label class=\"inner_link_article_item\"><s...\n",
       "3   <div><label class=\"inner_link_article_item\"><s...\n",
       "4   <div><label class=\"inner_link_article_item\"><s...\n",
       "5   <div><label class=\"inner_link_article_item\"><s...\n",
       "6   <div><label class=\"inner_link_article_item\"><s...\n",
       "7   <div><label class=\"inner_link_article_item\"><s...\n",
       "8   <div><label class=\"inner_link_article_item\"><s...\n",
       "9   <div><label class=\"inner_link_article_item\"><s...\n",
       "10  <div><label class=\"inner_link_article_item\"><s...\n",
       "11  <div><label class=\"inner_link_article_item\"><s...\n",
       "12  <div><label class=\"inner_link_article_item\"><s...\n",
       "13  <div><label class=\"inner_link_article_item\"><s...\n",
       "14  <div><label class=\"inner_link_article_item\"><s...\n",
       "15  <div><label class=\"inner_link_article_item\"><s...\n",
       "16  <div><label class=\"inner_link_article_item\"><s...\n",
       "17  <div><label class=\"inner_link_article_item\"><s...\n",
       "18  <div><label class=\"inner_link_article_item\"><s...\n",
       "19  <div><label class=\"inner_link_article_item\"><s...\n",
       "20  <div><label class=\"inner_link_article_item\"><s...\n",
       "21  <div><label class=\"inner_link_article_item\"><s...\n",
       "22  <div><label class=\"inner_link_article_item\"><s...\n",
       "23  <div><label class=\"inner_link_article_item\"><s...\n",
       "24  <div><label class=\"inner_link_article_item\"><s...\n",
       "25  <div><label class=\"inner_link_article_item\"><s...\n",
       "26  <div><label class=\"inner_link_article_item\"><s...\n",
       "27  <div><label class=\"inner_link_article_item\"><s...\n",
       "28  <div><label class=\"inner_link_article_item\"><s...\n",
       "29  <div><label class=\"inner_link_article_item\"><s...\n",
       "30  <div><label class=\"inner_link_article_item\"><s...\n",
       "31  <div><label class=\"inner_link_article_item\"><s...\n",
       "32  <div><label class=\"inner_link_article_item\"><s...\n",
       "33  <div><label class=\"inner_link_article_item\"><s...\n",
       "34  <div><label class=\"inner_link_article_item\"><s...\n",
       "35  <div><label class=\"inner_link_article_item\"><s..."
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# One row per scraped page: the index is the page number and the single column\n",
    "# holds that page's raw HTML snippet.\n",
    "df = (\n",
    "    pd.DataFrame([html_raw])  # one row, one column per page number\n",
    "    .T  # transpose: one row per page number, single column labelled 0\n",
    "    .rename(columns={0: \"html_snippets\"})\n",
    ")\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Stored 'html_raw' (dict)\n"
     ]
    }
   ],
   "source": [
    "# Persist the scraped snippets twice: in IPython's %store database and as a\n",
    "# pickle file named \"html_raw\" in the working directory.\n",
    "%store html_raw\n",
    "# The context manager closes the file, so the pickle is fully flushed to disk and\n",
    "# no file handle is left open in the kernel.\n",
    "with open(\"html_raw\", 'wb') as filehandler:\n",
    "    pickle.dump(html_raw, filehandler)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "35\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "Empty DataFrame\n",
       "Columns: [html_snippets]\n",
       "Index: []"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Keep the first occurrence of each distinct snippet; a page whose snippet is\n",
    "# identical to an earlier page's is dropped from `df_out`.\n",
    "df_out = df.drop_duplicates()\n",
    "print(len(df_out))\n",
    "# Rows flagged as repeats of an earlier row (shown as the cell output).\n",
    "df.loc[df.duplicated()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "[]"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Pages to scrape again: first the pages whose snippet duplicates an earlier page ...\n",
    "try_again = list(df.loc[df.duplicated()].index)\n",
    "print(try_again)\n",
    "# ... then every requested page that has no row in `df` at all.\n",
    "missing_pages = set(pages).difference(set(df.index.values))\n",
    "try_again = try_again + list(missing_pages)\n",
    "try_again"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Write the de-duplicated snippets to the per-account TSV file.\n",
    "filename = fn[\"output\"][\"公众号_htm_snippets\"]\n",
    "snippets_path = filename.format(公众号=公众号)  # fill the account name into the template\n",
    "df_out.to_csv(snippets_path, sep=\"\\t\", encoding=\"utf8\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "6,5,6,5,5,5,8,5,5,7,6,6,6,5,5,6,7,7,5,6,5,5,5,5,6,5,6,5,5,5,5,5,5,5,1,"
     ]
    }
   ],
   "source": [
    "def parse_html_snippets(_snippet_):\n",
    "    \"\"\"Parse one page's HTML snippet into a DataFrame of articles.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    _snippet_ : str\n",
    "        HTML text of one article-list page.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    pandas.DataFrame\n",
    "        Columns `title`, `create_time` and `link`. The three columns are gathered\n",
    "        by independent XPath queries over the whole snippet, so they line up only\n",
    "        when each query returns the same number of matches.\n",
    "    \"\"\"\n",
    "    tree = fromstring(_snippet_)\n",
    "    titles = [node.text for node in tree.xpath('//div[@class=\"inner_link_article_title\"]')]\n",
    "    dates = [node.text for node in tree.xpath('//div[@class=\"inner_link_article_date\"]')]\n",
    "    links = list(tree.xpath('//a/@href'))\n",
    "    return pd.DataFrame({\"title\": titles, \"create_time\": dates, \"link\": links})\n",
    "    \n",
    "# Parse every page's snippet into its own DataFrame and collect them in `l_df`.\n",
    "# Snippets are read from `df` (not the de-duplicated `df_out`), indexed by page number.\n",
    "l_df = []\n",
    "for p in pages:\n",
    "    _df_ = parse_html_snippets(df.loc[p,\"html_snippets\"])\n",
    "    print (len(_df_), end=\",\")  # number of articles found on this page\n",
    "    l_df.append(_df_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>案例拆解：知群“产品设计入门训练营”拆解</td>\n",
       "      <td>2020-05-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>案例拆解：洋葱学院（原洋葱数学）增长体系拆解</td>\n",
       "      <td>2020-05-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>案例拆解：微师学院文言文引流课拆解</td>\n",
       "      <td>2020-05-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>在线教育圈最新335个增长案例拆解.doc</td>\n",
       "      <td>2020-05-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>案例拆解：学而思轻课之免费送好课案例</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09</td>\n",
       "      <td>2020-05-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...</td>\n",
       "      <td>2020-05-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>案例拆解：一起学网课0元7节直播课</td>\n",
       "      <td>2020-05-09</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>松月4月总结：走得远的人生，拼的就是复原力</td>\n",
       "      <td>2020-05-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>在线教育花钱指南：5步搞定公众号投放，100%提升ROI</td>\n",
       "      <td>2020-05-07</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                title create_time  \\\n",
       "0                                案例拆解：知群“产品设计入门训练营”拆解  2020-05-16   \n",
       "1                              案例拆解：洋葱学院（原洋葱数学）增长体系拆解  2020-05-15   \n",
       "2                                   案例拆解：微师学院文言文引流课拆解  2020-05-14   \n",
       "3                               在线教育圈最新335个增长案例拆解.doc  2020-05-13   \n",
       "4                         狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？  2020-05-12   \n",
       "5                                  案例拆解：学而思轻课之免费送好课案例  2020-05-12   \n",
       "6             从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09  2020-05-11   \n",
       "7   每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...  2020-05-10   \n",
       "8                                   案例拆解：一起学网课0元7节直播课  2020-05-09   \n",
       "9                               松月4月总结：走得远的人生，拼的就是复原力  2020-05-08   \n",
       "10                       在线教育花钱指南：5步搞定公众号投放，100%提升ROI  2020-05-07   \n",
       "\n",
       "                                                 link  \n",
       "0   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "1   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "2   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "3   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "4   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "5   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "6   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "7   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "8   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "9   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "10  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  "
      ]
     },
     "execution_count": 37,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_url_out = pd.concat(l_df).reset_index(drop=True)\n",
    "df_url_out.loc[0:10]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>184</th>\n",
       "      <td>春节红包战全面开打，BAT与今日头条，谁能胜出？</td>\n",
       "      <td>2019-02-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>185</th>\n",
       "      <td>连咖啡裂变指南：1天开店52万家，只因有这4个秘诀</td>\n",
       "      <td>2019-01-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>186</th>\n",
       "      <td>裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛</td>\n",
       "      <td>2019-01-19</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>187</th>\n",
       "      <td>自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案</td>\n",
       "      <td>2019-01-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>188</th>\n",
       "      <td>一年开2000家门店，luckincoffee有哪些可复用的增长套路？</td>\n",
       "      <td>2019-01-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                   title create_time  \\\n",
       "184             春节红包战全面开打，BAT与今日头条，谁能胜出？  2019-02-02   \n",
       "185            连咖啡裂变指南：1天开店52万家，只因有这4个秘诀  2019-01-28   \n",
       "186            裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛  2019-01-19   \n",
       "187          自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案  2019-01-17   \n",
       "188  一年开2000家门店，luckincoffee有哪些可复用的增长套路？  2019-01-16   \n",
       "\n",
       "                                                  link  \n",
       "184  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "185  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "186  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "187  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "188  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  "
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_url_out.tail(5)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>value</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>案例拆解：知群“产品设计入门训练营”拆解</td>\n",
       "      <td>2020-05-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>案例拆解：洋葱学院（原洋葱数学）增长体系拆解</td>\n",
       "      <td>2020-05-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>案例拆解：微师学院文言文引流课拆解</td>\n",
       "      <td>2020-05-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>在线教育圈最新335个增长案例拆解.doc</td>\n",
       "      <td>2020-05-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>案例拆解：学而思轻课之免费送好课案例</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09</td>\n",
       "      <td>2020-05-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...</td>\n",
       "      <td>2020-05-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>案例拆解：一起学网课0元7节直播课</td>\n",
       "      <td>2020-05-09</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>松月4月总结：走得远的人生，拼的就是复原力</td>\n",
       "      <td>2020-05-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>在线教育花钱指南：5步搞定公众号投放，100%提升ROI</td>\n",
       "      <td>2020-05-07</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>案例拆解：跟谁学超级拼读4天训练营</td>\n",
       "      <td>2020-05-06</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>今晚分享报名：从0到1，训练营的闭环设计</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>假期还剩2天，花20分钟读完《金字塔原理》可好？</td>\n",
       "      <td>2020-05-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>案例拆解：跟谁学引流活动系统拆解</td>\n",
       "      <td>2020-05-03</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>案例拆解：作业帮一课3元拼团</td>\n",
       "      <td>2020-05-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>整整 49 篇运营底层逻辑文章，你确定五一还要出门吗</td>\n",
       "      <td>2020-05-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>案例拆解：常青藤爸爸英语体验课全流程拆解</td>\n",
       "      <td>2020-04-30</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>10600字梳理训练营SOP服务流程、成交细节、产品搭建</td>\n",
       "      <td>2020-04-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07</td>\n",
       "      <td>2020-04-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系</td>\n",
       "      <td>2020-04-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>案例拆解：4400字斑马AI课增长体系拆解</td>\n",
       "      <td>2020-04-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06</td>\n",
       "      <td>2020-04-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>案例拆解：宝玩英语社群营销推广员机制</td>\n",
       "      <td>2020-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>案例拆解：西瓜创客少儿编程0元课拆解</td>\n",
       "      <td>2020-04-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>案例拆解：2600字拆解小步早教公众号增长体系</td>\n",
       "      <td>2020-04-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>在线教育破局指南：跑通3种流量转化模型，100%规模化增长</td>\n",
       "      <td>2020-04-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>案例拆解：3000字拆解掌门少儿拉新转化策略</td>\n",
       "      <td>2020-04-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>Q1教育圈增长案例合集：这289个案例，值得研究（免费领取）</td>\n",
       "      <td>2020-04-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>156</th>\n",
       "      <td>转化率仅9%的失败引流课复盘，让我懂得6条运营经验</td>\n",
       "      <td>2019-04-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>157</th>\n",
       "      <td>从流量到用户：社区团购如何利用社群做到日流水百万？</td>\n",
       "      <td>2019-04-25</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>158</th>\n",
       "      <td>3种模型+4个步骤，10倍提升裂变式社群转化率的秘籍</td>\n",
       "      <td>2019-04-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>159</th>\n",
       "      <td>拉新转化利器！如何做一场裂变10000+用户的直播分享？</td>\n",
       "      <td>2019-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>160</th>\n",
       "      <td>4大产品设计维度，轻松打造超高口碑的爆款训练营</td>\n",
       "      <td>2019-04-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>161</th>\n",
       "      <td>一张让你轻松制定在线教育用户增长策略的流量运营地图！</td>\n",
       "      <td>2019-04-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>162</th>\n",
       "      <td>想要成为在线教育里的No.1？这有一套最适合你的方法论</td>\n",
       "      <td>2019-04-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>163</th>\n",
       "      <td>7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧</td>\n",
       "      <td>2019-04-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>164</th>\n",
       "      <td>运营人如何摆脱「996」魔咒？可能需要这七个习惯</td>\n",
       "      <td>2019-04-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>165</th>\n",
       "      <td>营销心理学：运营人必须知道的7大用户转化套路</td>\n",
       "      <td>2019-04-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>166</th>\n",
       "      <td>流量池思维的两大核心洞察，教你掌握最低成本获客之道</td>\n",
       "      <td>2019-03-31</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>167</th>\n",
       "      <td>这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？</td>\n",
       "      <td>2019-03-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>169</th>\n",
       "      <td>9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路</td>\n",
       "      <td>2019-03-22</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>170</th>\n",
       "      <td>致运营人：这里有一份价值100万的文案创作指南，请查收</td>\n",
       "      <td>2019-03-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>171</th>\n",
       "      <td>这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？</td>\n",
       "      <td>2019-03-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>172</th>\n",
       "      <td>精准渠道引流4步法，让拉新和转化不再做无用功！</td>\n",
       "      <td>2019-03-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>173</th>\n",
       "      <td>面试与工作必备：运营人必须要懂的9大思考模型</td>\n",
       "      <td>2019-03-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>174</th>\n",
       "      <td>流量高企，增长乏力？快试试这6个低成本的营销套路！</td>\n",
       "      <td>2019-03-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>1个方法快速升级思维模型，洞破你与运营高手的巨大差距</td>\n",
       "      <td>2019-03-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>176</th>\n",
       "      <td>小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系</td>\n",
       "      <td>2019-03-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>177</th>\n",
       "      <td>读书会，新的流量增长点</td>\n",
       "      <td>2019-02-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>178</th>\n",
       "      <td>运营人必备的职场逆袭进阶手册</td>\n",
       "      <td>2019-02-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>179</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（下）</td>\n",
       "      <td>2019-02-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>180</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（上）</td>\n",
       "      <td>2019-02-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>181</th>\n",
       "      <td>我为什么赞成停更「双微一抖」？</td>\n",
       "      <td>2019-02-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>182</th>\n",
       "      <td>运营人成长指南：4大维度告诉你，如何成为新媒体操盘手</td>\n",
       "      <td>2019-02-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>183</th>\n",
       "      <td>由《流浪地球》豆瓣评分引发的关于流量和口碑的思考</td>\n",
       "      <td>2019-02-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>185</th>\n",
       "      <td>连咖啡裂变指南：1天开店52万家，只因有这4个秘诀</td>\n",
       "      <td>2019-01-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>187</th>\n",
       "      <td>自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案</td>\n",
       "      <td>2019-01-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>188</th>\n",
       "      <td>一年开2000家门店，luckincoffee有哪些可复用的增长套路？</td>\n",
       "      <td>2019-01-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>162 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                   title create_time  \\\n",
       "value                                                                  \n",
       "0                                   案例拆解：知群“产品设计入门训练营”拆解  2020-05-16   \n",
       "1                                 案例拆解：洋葱学院（原洋葱数学）增长体系拆解  2020-05-15   \n",
       "2                                      案例拆解：微师学院文言文引流课拆解  2020-05-14   \n",
       "3                                  在线教育圈最新335个增长案例拆解.doc  2020-05-13   \n",
       "4                            狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？  2020-05-12   \n",
       "5                                     案例拆解：学而思轻课之免费送好课案例  2020-05-12   \n",
       "6                从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09  2020-05-11   \n",
       "7      每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...  2020-05-10   \n",
       "8                                      案例拆解：一起学网课0元7节直播课  2020-05-09   \n",
       "9                                  松月4月总结：走得远的人生，拼的就是复原力  2020-05-08   \n",
       "10                          在线教育花钱指南：5步搞定公众号投放，100%提升ROI  2020-05-07   \n",
       "11                                     案例拆解：跟谁学超级拼读4天训练营  2020-05-06   \n",
       "12                  在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08  2020-05-05   \n",
       "13                                  今晚分享报名：从0到1，训练营的闭环设计  2020-05-05   \n",
       "14                              假期还剩2天，花20分钟读完《金字塔原理》可好？  2020-05-04   \n",
       "15                                      案例拆解：跟谁学引流活动系统拆解  2020-05-03   \n",
       "16                                        案例拆解：作业帮一课3元拼团  2020-05-02   \n",
       "17                            整整 49 篇运营底层逻辑文章，你确定五一还要出门吗  2020-05-01   \n",
       "18                                  案例拆解：常青藤爸爸英语体验课全流程拆解  2020-04-30   \n",
       "19                          10600字梳理训练营SOP服务流程、成交细节、产品搭建  2020-04-29   \n",
       "21             100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07  2020-04-27   \n",
       "24                         案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系  2020-04-24   \n",
       "26                                 案例拆解：4400字斑马AI课增长体系拆解  2020-04-21   \n",
       "27                    1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06  2020-04-20   \n",
       "29                                    案例拆解：宝玩英语社群营销推广员机制  2020-04-18   \n",
       "30                                    案例拆解：西瓜创客少儿编程0元课拆解  2020-04-17   \n",
       "31                               案例拆解：2600字拆解小步早教公众号增长体系  2020-04-16   \n",
       "32                         在线教育破局指南：跑通3种流量转化模型，100%规模化增长  2020-04-15   \n",
       "33                                案例拆解：3000字拆解掌门少儿拉新转化策略  2020-04-15   \n",
       "34                        Q1教育圈增长案例合集：这289个案例，值得研究（免费领取）  2020-04-14   \n",
       "...                                                  ...         ...   \n",
       "156                            转化率仅9%的失败引流课复盘，让我懂得6条运营经验  2019-04-28   \n",
       "157                            从流量到用户：社区团购如何利用社群做到日流水百万？  2019-04-25   \n",
       "158                           3种模型+4个步骤，10倍提升裂变式社群转化率的秘籍  2019-04-21   \n",
       "159                         拉新转化利器！如何做一场裂变10000+用户的直播分享？  2019-04-18   \n",
       "160                              4大产品设计维度，轻松打造超高口碑的爆款训练营  2019-04-16   \n",
       "161                           一张让你轻松制定在线教育用户增长策略的流量运营地图！  2019-04-14   \n",
       "162                          想要成为在线教育里的No.1？这有一套最适合你的方法论  2019-04-10   \n",
       "163                             7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧  2019-04-05   \n",
       "164                             运营人如何摆脱「996」魔咒？可能需要这七个习惯  2019-04-04   \n",
       "165                               营销心理学：运营人必须知道的7大用户转化套路  2019-04-02   \n",
       "166                            流量池思维的两大核心洞察，教你掌握最低成本获客之道  2019-03-31   \n",
       "167                           这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？  2019-03-29   \n",
       "169                           9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路  2019-03-22   \n",
       "170                          致运营人：这里有一份价值100万的文案创作指南，请查收  2019-03-20   \n",
       "171                           这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？  2019-03-16   \n",
       "172                              精准渠道引流4步法，让拉新和转化不再做无用功！  2019-03-13   \n",
       "173                               面试与工作必备：运营人必须要懂的9大思考模型  2019-03-11   \n",
       "174                            流量高企，增长乏力？快试试这6个低成本的营销套路！  2019-03-08   \n",
       "175                           1个方法快速升级思维模型，洞破你与运营高手的巨大差距  2019-03-04   \n",
       "176                          小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系  2019-03-01   \n",
       "177                                          读书会，新的流量增长点  2019-02-27   \n",
       "178                                       运营人必备的职场逆袭进阶手册  2019-02-24   \n",
       "179                       K12在线招生指南：提高40%流量转化率的系统运营打法（下）  2019-02-21   \n",
       "180                       K12在线招生指南：提高40%流量转化率的系统运营打法（上）  2019-02-17   \n",
       "181                                      我为什么赞成停更「双微一抖」？  2019-02-16   \n",
       "182                           运营人成长指南：4大维度告诉你，如何成为新媒体操盘手  2019-02-13   \n",
       "183                             由《流浪地球》豆瓣评分引发的关于流量和口碑的思考  2019-02-11   \n",
       "185                            连咖啡裂变指南：1天开店52万家，只因有这4个秘诀  2019-01-28   \n",
       "187                          自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案  2019-01-17   \n",
       "188                  一年开2000家门店，luckincoffee有哪些可复用的增长套路？  2019-01-16   \n",
       "\n",
       "                                                    link  \n",
       "value                                                     \n",
       "0      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "1      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "2      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "3      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "4      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "5      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "6      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "7      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "8      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "9      http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "10     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "11     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "12     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "13     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "14     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "15     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "16     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "17     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "18     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "19     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "21     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "24     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "26     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "27     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "29     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "30     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "31     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "32     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "33     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "34     http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "...                                                  ...  \n",
       "156    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "157    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "158    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "159    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "160    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "161    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "162    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "163    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "164    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "165    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "166    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "167    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "169    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "170    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "171    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "172    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "173    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "174    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "175    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "176    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "177    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "178    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "179    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "180    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "181    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "182    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "183    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "185    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "187    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "188    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "\n",
       "[162 rows x 3 columns]"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Tag each article by the keywords found in its title.\n",
    "# The leading \"\" is a catch-all: it matches every title and seeds each row as untagged.\n",
    "# Tags later in the list overwrite earlier ones for the same row.\n",
    "tagging_list = [\"\",\"马化腾\", \"腾讯\", \"微众银行\",\"腾讯复星\",\"腾讯风控\",\"腾讯支付\",\"WeChat\",\"We Remit\",\\\n",
    "                \"公益日\",\"红包\",\\\n",
    "                \"腾讯财付通\",\"鹅厂\",\"QQ钱包\",\"QQ红包\",\"QQ\",\\\n",
    "                \"只有一\",\"大咖\",\"听说\",\"图片\",\"照片\",\"小编\",\\\n",
    "                \"洗钱\", \"黑产\",\"被骗\",\"腾讯安全课\",\"诈骗\", \"炒股\",\"神秘兼职\",\"神秘组织\",\\\n",
    "                \"财付通\", \"品牌\",\\\n",
    "                \"收款\",\\\n",
    "                \"报告\",\\\n",
    "                \"银行卡\",\"理财\",\"选股\",\"发票\",\"基金\",\\\n",
    "                \"区块链\",\"金融云\",\"O2O\",\"农产品\",\"家乡\",\\\n",
    "                \"数据\", \"数据赋能\", \"智能\", \"数字孪生\", \"智慧大脑\",\\\n",
    "                \"出行\",\"乘车\",\"公交\",\"乘车码\", \"智慧地铁\",\\\n",
    "                \"高峰论坛\", \"智库\",\\\n",
    "                \"央行\",\"新规\", \\\n",
    "                \"微信\", \"微信支付\", \"跨境支付\", \"移动支付\",\"非银行支付\",\"电子支付\",\\\n",
    "                \"互联网金融\", \"金融科技\",\"互联网＋\",\"互联网+金融\",\"普惠金融\",\"虚拟银行\",\\\n",
    "                \"开放\",\"生态\",\"复杂\",\"互联网思维\",\"全球合作伙伴\",\\\n",
    "                \"联合国\", \"城市\", \"粤港澳大湾区\", \"平台\", \"可持续发展\", \"未来\", \"绿色\",\\\n",
    "                \"医护\",\"防护服\",\"小时\",\"武汉\",\"危机\",\"新冠肺炎\", \"疫\", \"疫情\", \"复工\",\"停课\",\"宅经济\",\\\n",
    "                \"基建\",\"新基建\"]  # later tags overwrite earlier ones\n",
    "\n",
    "# One frame per tag: index = matching row labels, column \"variable\" = the tag.\n",
    "v_v_list = []\n",
    "\n",
    "for tag in tagging_list:\n",
    "    # regex=False: tags are literal keywords; as a regex, \"互联网+金融\" would treat\n",
    "    # \"+\" as a quantifier and never match the literal text.\n",
    "    # na=(tag == \"\"): a missing title matches only the catch-all, so the mask never\n",
    "    # holds NaN (which would make the row selection raise) and the row stays untagged.\n",
    "    is_match = df_url_out.title.str.contains(tag, regex=False, na=(tag == \"\"))\n",
    "    index_list = df_url_out[is_match].index.tolist()\n",
    "    v_v_pairs = pd.DataFrame({tag:index_list}).melt().set_index(\"value\")\n",
    "    v_v_list.append(v_v_pairs)\n",
    "\n",
    "# Start from a copy of the catch-all frame so v_v_list[0] is not mutated, then let\n",
    "# each later tag overwrite the rows it matched.\n",
    "df_cat = v_v_list[0].copy()\n",
    "for d in v_v_list[1:]:\n",
    "    df_cat.update(d)\n",
    "\n",
    "# Rows that no keyword tagged yet\n",
    "df_url_out.loc[df_cat.query('variable==\"\"').index]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA==&mid=2247484936&idx=1&sn=1857d02ee66edd7fe2c9f0eb605fb038&chksm=ecb08049dbc7095f9a37c119996c5176f86f7a954ed21fe8a123bbc987f05642578bfdf13d7b#rd'"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the complete link stored for the row labelled 53.\n",
    "df_url_out.loc[53, \"link\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "Empty DataFrame\n",
       "Columns: [title, create_time, link]\n",
       "Index: []"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Rows that repeat an earlier row in every column.\n",
    "df_url_out.loc[df_url_out.duplicated()]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>案例拆解：知群“产品设计入门训练营”拆解</td>\n",
       "      <td>2020-05-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>案例拆解：洋葱学院（原洋葱数学）增长体系拆解</td>\n",
       "      <td>2020-05-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>案例拆解：微师学院文言文引流课拆解</td>\n",
       "      <td>2020-05-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>在线教育圈最新335个增长案例拆解.doc</td>\n",
       "      <td>2020-05-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>案例拆解：学而思轻课之免费送好课案例</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09</td>\n",
       "      <td>2020-05-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...</td>\n",
       "      <td>2020-05-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>案例拆解：一起学网课0元7节直播课</td>\n",
       "      <td>2020-05-09</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>松月4月总结：走得远的人生，拼的就是复原力</td>\n",
       "      <td>2020-05-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>在线教育花钱指南：5步搞定公众号投放，100%提升ROI</td>\n",
       "      <td>2020-05-07</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>案例拆解：跟谁学超级拼读4天训练营</td>\n",
       "      <td>2020-05-06</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>今晚分享报名：从0到1，训练营的闭环设计</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>假期还剩2天，花20分钟读完《金字塔原理》可好？</td>\n",
       "      <td>2020-05-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>案例拆解：跟谁学引流活动系统拆解</td>\n",
       "      <td>2020-05-03</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>案例拆解：作业帮一课3元拼团</td>\n",
       "      <td>2020-05-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>整整 49 篇运营底层逻辑文章，你确定五一还要出门吗</td>\n",
       "      <td>2020-05-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>案例拆解：常青藤爸爸英语体验课全流程拆解</td>\n",
       "      <td>2020-04-30</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>10600字梳理训练营SOP服务流程、成交细节、产品搭建</td>\n",
       "      <td>2020-04-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>案例拆解：腾讯 ABCmouse 用户增长体系</td>\n",
       "      <td>2020-04-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07</td>\n",
       "      <td>2020-04-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>任务宝作为微信生态内常用获客工具，有哪些流量模型又有哪些风控设计？\\n\\n野生运营本周分享，...</td>\n",
       "      <td>2020-04-26</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>精彩回顾：教育企业如何用企业微信3.0实现数字化转型</td>\n",
       "      <td>2020-04-25</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系</td>\n",
       "      <td>2020-04-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>好未来、新东方、跟谁学等增长运营，平时都看什么书？</td>\n",
       "      <td>2020-04-23</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>案例拆解：4400字斑马AI课增长体系拆解</td>\n",
       "      <td>2020-04-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06</td>\n",
       "      <td>2020-04-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>不会玩企业微信，还好意思说自己是做增长的？\\n\\n野生运营本周分享，松月请来了阿泽，专注B端...</td>\n",
       "      <td>2020-04-19</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>案例拆解：宝玩英语社群营销推广员机制</td>\n",
       "      <td>2020-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>159</th>\n",
       "      <td>拉新转化利器！如何做一场裂变10000+用户的直播分享？</td>\n",
       "      <td>2019-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>160</th>\n",
       "      <td>4大产品设计维度，轻松打造超高口碑的爆款训练营</td>\n",
       "      <td>2019-04-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>161</th>\n",
       "      <td>一张让你轻松制定在线教育用户增长策略的流量运营地图！</td>\n",
       "      <td>2019-04-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>162</th>\n",
       "      <td>想要成为在线教育里的No.1？这有一套最适合你的方法论</td>\n",
       "      <td>2019-04-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>163</th>\n",
       "      <td>7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧</td>\n",
       "      <td>2019-04-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>164</th>\n",
       "      <td>运营人如何摆脱「996」魔咒？可能需要这七个习惯</td>\n",
       "      <td>2019-04-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>165</th>\n",
       "      <td>营销心理学：运营人必须知道的7大用户转化套路</td>\n",
       "      <td>2019-04-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>166</th>\n",
       "      <td>流量池思维的两大核心洞察，教你掌握最低成本获客之道</td>\n",
       "      <td>2019-03-31</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>167</th>\n",
       "      <td>这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？</td>\n",
       "      <td>2019-03-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>168</th>\n",
       "      <td>深度干货：1个公式拆尽微信裂变玩法，重塑流量池思维</td>\n",
       "      <td>2019-03-25</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>169</th>\n",
       "      <td>9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路</td>\n",
       "      <td>2019-03-22</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>170</th>\n",
       "      <td>致运营人：这里有一份价值100万的文案创作指南，请查收</td>\n",
       "      <td>2019-03-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>171</th>\n",
       "      <td>这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？</td>\n",
       "      <td>2019-03-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>172</th>\n",
       "      <td>精准渠道引流4步法，让拉新和转化不再做无用功！</td>\n",
       "      <td>2019-03-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>173</th>\n",
       "      <td>面试与工作必备：运营人必须要懂的9大思考模型</td>\n",
       "      <td>2019-03-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>174</th>\n",
       "      <td>流量高企，增长乏力？快试试这6个低成本的营销套路！</td>\n",
       "      <td>2019-03-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>1个方法快速升级思维模型，洞破你与运营高手的巨大差距</td>\n",
       "      <td>2019-03-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>176</th>\n",
       "      <td>小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系</td>\n",
       "      <td>2019-03-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>177</th>\n",
       "      <td>读书会，新的流量增长点</td>\n",
       "      <td>2019-02-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>178</th>\n",
       "      <td>运营人必备的职场逆袭进阶手册</td>\n",
       "      <td>2019-02-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>179</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（下）</td>\n",
       "      <td>2019-02-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>180</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（上）</td>\n",
       "      <td>2019-02-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>181</th>\n",
       "      <td>我为什么赞成停更「双微一抖」？</td>\n",
       "      <td>2019-02-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>182</th>\n",
       "      <td>运营人成长指南：4大维度告诉你，如何成为新媒体操盘手</td>\n",
       "      <td>2019-02-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>183</th>\n",
       "      <td>由《流浪地球》豆瓣评分引发的关于流量和口碑的思考</td>\n",
       "      <td>2019-02-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>184</th>\n",
       "      <td>春节红包战全面开打，BAT与今日头条，谁能胜出？</td>\n",
       "      <td>2019-02-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>185</th>\n",
       "      <td>连咖啡裂变指南：1天开店52万家，只因有这4个秘诀</td>\n",
       "      <td>2019-01-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>186</th>\n",
       "      <td>裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛</td>\n",
       "      <td>2019-01-19</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>187</th>\n",
       "      <td>自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案</td>\n",
       "      <td>2019-01-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>188</th>\n",
       "      <td>一年开2000家门店，luckincoffee有哪些可复用的增长套路？</td>\n",
       "      <td>2019-01-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>189 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 title create_time  \\\n",
       "0                                 案例拆解：知群“产品设计入门训练营”拆解  2020-05-16   \n",
       "1                               案例拆解：洋葱学院（原洋葱数学）增长体系拆解  2020-05-15   \n",
       "2                                    案例拆解：微师学院文言文引流课拆解  2020-05-14   \n",
       "3                                在线教育圈最新335个增长案例拆解.doc  2020-05-13   \n",
       "4                          狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？  2020-05-12   \n",
       "5                                   案例拆解：学而思轻课之免费送好课案例  2020-05-12   \n",
       "6              从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09  2020-05-11   \n",
       "7    每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...  2020-05-10   \n",
       "8                                    案例拆解：一起学网课0元7节直播课  2020-05-09   \n",
       "9                                松月4月总结：走得远的人生，拼的就是复原力  2020-05-08   \n",
       "10                        在线教育花钱指南：5步搞定公众号投放，100%提升ROI  2020-05-07   \n",
       "11                                   案例拆解：跟谁学超级拼读4天训练营  2020-05-06   \n",
       "12                在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08  2020-05-05   \n",
       "13                                今晚分享报名：从0到1，训练营的闭环设计  2020-05-05   \n",
       "14                            假期还剩2天，花20分钟读完《金字塔原理》可好？  2020-05-04   \n",
       "15                                    案例拆解：跟谁学引流活动系统拆解  2020-05-03   \n",
       "16                                      案例拆解：作业帮一课3元拼团  2020-05-02   \n",
       "17                          整整 49 篇运营底层逻辑文章，你确定五一还要出门吗  2020-05-01   \n",
       "18                                案例拆解：常青藤爸爸英语体验课全流程拆解  2020-04-30   \n",
       "19                        10600字梳理训练营SOP服务流程、成交细节、产品搭建  2020-04-29   \n",
       "20                             案例拆解：腾讯 ABCmouse 用户增长体系  2020-04-28   \n",
       "21           100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07  2020-04-27   \n",
       "22   任务宝作为微信生态内常用获客工具，有哪些流量模型又有哪些风控设计？\\n\\n野生运营本周分享，...  2020-04-26   \n",
       "23                          精彩回顾：教育企业如何用企业微信3.0实现数字化转型  2020-04-25   \n",
       "24                       案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系  2020-04-24   \n",
       "25                           好未来、新东方、跟谁学等增长运营，平时都看什么书？  2020-04-23   \n",
       "26                               案例拆解：4400字斑马AI课增长体系拆解  2020-04-21   \n",
       "27                  1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06  2020-04-20   \n",
       "28   不会玩企业微信，还好意思说自己是做增长的？\\n\\n野生运营本周分享，松月请来了阿泽，专注B端...  2020-04-19   \n",
       "29                                  案例拆解：宝玩英语社群营销推广员机制  2020-04-18   \n",
       "..                                                 ...         ...   \n",
       "159                       拉新转化利器！如何做一场裂变10000+用户的直播分享？  2019-04-18   \n",
       "160                            4大产品设计维度，轻松打造超高口碑的爆款训练营  2019-04-16   \n",
       "161                         一张让你轻松制定在线教育用户增长策略的流量运营地图！  2019-04-14   \n",
       "162                        想要成为在线教育里的No.1？这有一套最适合你的方法论  2019-04-10   \n",
       "163                           7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧  2019-04-05   \n",
       "164                           运营人如何摆脱「996」魔咒？可能需要这七个习惯  2019-04-04   \n",
       "165                             营销心理学：运营人必须知道的7大用户转化套路  2019-04-02   \n",
       "166                          流量池思维的两大核心洞察，教你掌握最低成本获客之道  2019-03-31   \n",
       "167                         这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？  2019-03-29   \n",
       "168                          深度干货：1个公式拆尽微信裂变玩法，重塑流量池思维  2019-03-25   \n",
       "169                         9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路  2019-03-22   \n",
       "170                        致运营人：这里有一份价值100万的文案创作指南，请查收  2019-03-20   \n",
       "171                         这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？  2019-03-16   \n",
       "172                            精准渠道引流4步法，让拉新和转化不再做无用功！  2019-03-13   \n",
       "173                             面试与工作必备：运营人必须要懂的9大思考模型  2019-03-11   \n",
       "174                          流量高企，增长乏力？快试试这6个低成本的营销套路！  2019-03-08   \n",
       "175                         1个方法快速升级思维模型，洞破你与运营高手的巨大差距  2019-03-04   \n",
       "176                        小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系  2019-03-01   \n",
       "177                                        读书会，新的流量增长点  2019-02-27   \n",
       "178                                     运营人必备的职场逆袭进阶手册  2019-02-24   \n",
       "179                     K12在线招生指南：提高40%流量转化率的系统运营打法（下）  2019-02-21   \n",
       "180                     K12在线招生指南：提高40%流量转化率的系统运营打法（上）  2019-02-17   \n",
       "181                                    我为什么赞成停更「双微一抖」？  2019-02-16   \n",
       "182                         运营人成长指南：4大维度告诉你，如何成为新媒体操盘手  2019-02-13   \n",
       "183                           由《流浪地球》豆瓣评分引发的关于流量和口碑的思考  2019-02-11   \n",
       "184                           春节红包战全面开打，BAT与今日头条，谁能胜出？  2019-02-02   \n",
       "185                          连咖啡裂变指南：1天开店52万家，只因有这4个秘诀  2019-01-28   \n",
       "186                          裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛  2019-01-19   \n",
       "187                        自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案  2019-01-17   \n",
       "188                一年开2000家门店，luckincoffee有哪些可复用的增长套路？  2019-01-16   \n",
       "\n",
       "                                                  link  \n",
       "0    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "1    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "2    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "3    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "4    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "5    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "6    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "7    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "8    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "9    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "10   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "11   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "12   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "13   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "14   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "15   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "16   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "17   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "18   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "19   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "20   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "21   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "22   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "23   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "24   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "25   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "26   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "27   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "28   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "29   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "..                                                 ...  \n",
       "159  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "160  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "161  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "162  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "163  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "164  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "165  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "166  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "167  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "168  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "169  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "170  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "171  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "172  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "173  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "174  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "175  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "176  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "177  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "178  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "179  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "180  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "181  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "182  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "183  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "184  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "185  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "186  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "187  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "188  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...  \n",
       "\n",
       "[189 rows x 3 columns]"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Rows left after dropping exact repeats (first occurrence kept).\n",
    "df_url_out.drop_duplicates()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "      <th>variable</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>案例拆解：知群“产品设计入门训练营”拆解</td>\n",
       "      <td>2020-05-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>案例拆解：洋葱学院（原洋葱数学）增长体系拆解</td>\n",
       "      <td>2020-05-15</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>案例拆解：微师学院文言文引流课拆解</td>\n",
       "      <td>2020-05-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>在线教育圈最新335个增长案例拆解.doc</td>\n",
       "      <td>2020-05-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>案例拆解：学而思轻课之免费送好课案例</td>\n",
       "      <td>2020-05-12</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09</td>\n",
       "      <td>2020-05-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...</td>\n",
       "      <td>2020-05-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>案例拆解：一起学网课0元7节直播课</td>\n",
       "      <td>2020-05-09</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>松月4月总结：走得远的人生，拼的就是复原力</td>\n",
       "      <td>2020-05-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>在线教育花钱指南：5步搞定公众号投放，100%提升ROI</td>\n",
       "      <td>2020-05-07</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>案例拆解：跟谁学超级拼读4天训练营</td>\n",
       "      <td>2020-05-06</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>今晚分享报名：从0到1，训练营的闭环设计</td>\n",
       "      <td>2020-05-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>假期还剩2天，花20分钟读完《金字塔原理》可好？</td>\n",
       "      <td>2020-05-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>案例拆解：跟谁学引流活动系统拆解</td>\n",
       "      <td>2020-05-03</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>案例拆解：作业帮一课3元拼团</td>\n",
       "      <td>2020-05-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>整整 49 篇运营底层逻辑文章，你确定五一还要出门吗</td>\n",
       "      <td>2020-05-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>案例拆解：常青藤爸爸英语体验课全流程拆解</td>\n",
       "      <td>2020-04-30</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>10600字梳理训练营SOP服务流程、成交细节、产品搭建</td>\n",
       "      <td>2020-04-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>案例拆解：腾讯 ABCmouse 用户增长体系</td>\n",
       "      <td>2020-04-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>腾讯</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07</td>\n",
       "      <td>2020-04-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>任务宝作为微信生态内常用获客工具，有哪些流量模型又有哪些风控设计？\\n\\n野生运营本周分享，...</td>\n",
       "      <td>2020-04-26</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>生态</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>精彩回顾：教育企业如何用企业微信3.0实现数字化转型</td>\n",
       "      <td>2020-04-25</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>微信</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系</td>\n",
       "      <td>2020-04-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>好未来、新东方、跟谁学等增长运营，平时都看什么书？</td>\n",
       "      <td>2020-04-23</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>未来</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>案例拆解：4400字斑马AI课增长体系拆解</td>\n",
       "      <td>2020-04-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06</td>\n",
       "      <td>2020-04-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>不会玩企业微信，还好意思说自己是做增长的？\\n\\n野生运营本周分享，松月请来了阿泽，专注B端...</td>\n",
       "      <td>2020-04-19</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>微信</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>案例拆解：宝玩英语社群营销推广员机制</td>\n",
       "      <td>2020-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>159</th>\n",
       "      <td>拉新转化利器！如何做一场裂变10000+用户的直播分享？</td>\n",
       "      <td>2019-04-18</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>160</th>\n",
       "      <td>4大产品设计维度，轻松打造超高口碑的爆款训练营</td>\n",
       "      <td>2019-04-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>161</th>\n",
       "      <td>一张让你轻松制定在线教育用户增长策略的流量运营地图！</td>\n",
       "      <td>2019-04-14</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>162</th>\n",
       "      <td>想要成为在线教育里的No.1？这有一套最适合你的方法论</td>\n",
       "      <td>2019-04-10</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>163</th>\n",
       "      <td>7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧</td>\n",
       "      <td>2019-04-05</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>164</th>\n",
       "      <td>运营人如何摆脱「996」魔咒？可能需要这七个习惯</td>\n",
       "      <td>2019-04-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>165</th>\n",
       "      <td>营销心理学：运营人必须知道的7大用户转化套路</td>\n",
       "      <td>2019-04-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>166</th>\n",
       "      <td>流量池思维的两大核心洞察，教你掌握最低成本获客之道</td>\n",
       "      <td>2019-03-31</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>167</th>\n",
       "      <td>这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？</td>\n",
       "      <td>2019-03-29</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>168</th>\n",
       "      <td>深度干货：1个公式拆尽微信裂变玩法，重塑流量池思维</td>\n",
       "      <td>2019-03-25</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>微信</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>169</th>\n",
       "      <td>9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路</td>\n",
       "      <td>2019-03-22</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>170</th>\n",
       "      <td>致运营人：这里有一份价值100万的文案创作指南，请查收</td>\n",
       "      <td>2019-03-20</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>171</th>\n",
       "      <td>这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？</td>\n",
       "      <td>2019-03-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>172</th>\n",
       "      <td>精准渠道引流4步法，让拉新和转化不再做无用功！</td>\n",
       "      <td>2019-03-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>173</th>\n",
       "      <td>面试与工作必备：运营人必须要懂的9大思考模型</td>\n",
       "      <td>2019-03-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>174</th>\n",
       "      <td>流量高企，增长乏力？快试试这6个低成本的营销套路！</td>\n",
       "      <td>2019-03-08</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>1个方法快速升级思维模型，洞破你与运营高手的巨大差距</td>\n",
       "      <td>2019-03-04</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>176</th>\n",
       "      <td>小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系</td>\n",
       "      <td>2019-03-01</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>177</th>\n",
       "      <td>读书会，新的流量增长点</td>\n",
       "      <td>2019-02-27</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>178</th>\n",
       "      <td>运营人必备的职场逆袭进阶手册</td>\n",
       "      <td>2019-02-24</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>179</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（下）</td>\n",
       "      <td>2019-02-21</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>180</th>\n",
       "      <td>K12在线招生指南：提高40%流量转化率的系统运营打法（上）</td>\n",
       "      <td>2019-02-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>181</th>\n",
       "      <td>我为什么赞成停更「双微一抖」？</td>\n",
       "      <td>2019-02-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>182</th>\n",
       "      <td>运营人成长指南：4大维度告诉你，如何成为新媒体操盘手</td>\n",
       "      <td>2019-02-13</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>183</th>\n",
       "      <td>由《流浪地球》豆瓣评分引发的关于流量和口碑的思考</td>\n",
       "      <td>2019-02-11</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>184</th>\n",
       "      <td>春节红包战全面开打，BAT与今日头条，谁能胜出？</td>\n",
       "      <td>2019-02-02</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>红包</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>185</th>\n",
       "      <td>连咖啡裂变指南：1天开店52万家，只因有这4个秘诀</td>\n",
       "      <td>2019-01-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>186</th>\n",
       "      <td>裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛</td>\n",
       "      <td>2019-01-19</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>微信</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>187</th>\n",
       "      <td>自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案</td>\n",
       "      <td>2019-01-17</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>188</th>\n",
       "      <td>一年开2000家门店，luckincoffee有哪些可复用的增长套路？</td>\n",
       "      <td>2019-01-16</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>无法分类</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>189 rows × 4 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 title create_time  \\\n",
       "0                                 案例拆解：知群“产品设计入门训练营”拆解  2020-05-16   \n",
       "1                               案例拆解：洋葱学院（原洋葱数学）增长体系拆解  2020-05-15   \n",
       "2                                    案例拆解：微师学院文言文引流课拆解  2020-05-14   \n",
       "3                                在线教育圈最新335个增长案例拆解.doc  2020-05-13   \n",
       "4                          狂薅1000万粉丝背后，在线教育抖音卖课的路子有多野？  2020-05-12   \n",
       "5                                   案例拆解：学而思轻课之免费送好课案例  2020-05-12   \n",
       "6              从0到1训练营主题分享、猿辅导49元课拆解、活动诱饵设计……| 星球内参 09  2020-05-11   \n",
       "7    每周日的集体学习来啦！如何通过集中式的高强度学习，实现个人运营能力的跃迁？\\n\\n野生运营本...  2020-05-10   \n",
       "8                                    案例拆解：一起学网课0元7节直播课  2020-05-09   \n",
       "9                                松月4月总结：走得远的人生，拼的就是复原力  2020-05-08   \n",
       "10                        在线教育花钱指南：5步搞定公众号投放，100%提升ROI  2020-05-07   \n",
       "11                                   案例拆解：跟谁学超级拼读4天训练营  2020-05-06   \n",
       "12                在线教育转化模型、增长黑客工作箱、高薪运营成长图谱……| 星球内参 08  2020-05-05   \n",
       "13                                今晚分享报名：从0到1，训练营的闭环设计  2020-05-05   \n",
       "14                            假期还剩2天，花20分钟读完《金字塔原理》可好？  2020-05-04   \n",
       "15                                    案例拆解：跟谁学引流活动系统拆解  2020-05-03   \n",
       "16                                      案例拆解：作业帮一课3元拼团  2020-05-02   \n",
       "17                          整整 49 篇运营底层逻辑文章，你确定五一还要出门吗  2020-05-01   \n",
       "18                                案例拆解：常青藤爸爸英语体验课全流程拆解  2020-04-30   \n",
       "19                        10600字梳理训练营SOP服务流程、成交细节、产品搭建  2020-04-29   \n",
       "20                             案例拆解：腾讯 ABCmouse 用户增长体系  2020-04-28   \n",
       "21           100个各行业案例库、9张增长脑图、新世相10W+幸福课策略……| 星球内参 07  2020-04-27   \n",
       "22   任务宝作为微信生态内常用获客工具，有哪些流量模型又有哪些风控设计？\\n\\n野生运营本周分享，...  2020-04-26   \n",
       "23                          精彩回顾：教育企业如何用企业微信3.0实现数字化转型  2020-04-25   \n",
       "24                       案例拆解：4600字拆解洋葱学院（原洋葱数学）用户成长体系  2020-04-24   \n",
       "25                           好未来、新东方、跟谁学等增长运营，平时都看什么书？  2020-04-23   \n",
       "26                               案例拆解：4400字斑马AI课增长体系拆解  2020-04-21   \n",
       "27                  1079个案例库、社群新玩法、流量的精细化运营……| 星球内参 06  2020-04-20   \n",
       "28   不会玩企业微信，还好意思说自己是做增长的？\\n\\n野生运营本周分享，松月请来了阿泽，专注B端...  2020-04-19   \n",
       "29                                  案例拆解：宝玩英语社群营销推广员机制  2020-04-18   \n",
       "..                                                 ...         ...   \n",
       "159                       拉新转化利器！如何做一场裂变10000+用户的直播分享？  2019-04-18   \n",
       "160                            4大产品设计维度，轻松打造超高口碑的爆款训练营  2019-04-16   \n",
       "161                         一张让你轻松制定在线教育用户增长策略的流量运营地图！  2019-04-14   \n",
       "162                        想要成为在线教育里的No.1？这有一套最适合你的方法论  2019-04-10   \n",
       "163                           7大硬核流量玩法揭秘：羊毛党的胜利，独角兽的悲剧  2019-04-05   \n",
       "164                           运营人如何摆脱「996」魔咒？可能需要这七个习惯  2019-04-04   \n",
       "165                             营销心理学：运营人必须知道的7大用户转化套路  2019-04-02   \n",
       "166                          流量池思维的两大核心洞察，教你掌握最低成本获客之道  2019-03-31   \n",
       "167                         这个让罗永浩害怕和新世相刷屏的营销秘籍，究竟是什么？  2019-03-29   \n",
       "168                          深度干货：1个公式拆尽微信裂变玩法，重塑流量池思维  2019-03-25   \n",
       "169                         9元训练营，融资1个亿，扒一扒长投学堂的运营增长套路  2019-03-22   \n",
       "170                        致运营人：这里有一份价值100万的文案创作指南，请查收  2019-03-20   \n",
       "171                         这个在线教育“新品种”玩家，如何靠裂变获取百万粉丝？  2019-03-16   \n",
       "172                            精准渠道引流4步法，让拉新和转化不再做无用功！  2019-03-13   \n",
       "173                             面试与工作必备：运营人必须要懂的9大思考模型  2019-03-11   \n",
       "174                          流量高企，增长乏力？快试试这6个低成本的营销套路！  2019-03-08   \n",
       "175                         1个方法快速升级思维模型，洞破你与运营高手的巨大差距  2019-03-04   \n",
       "176                        小程序的4大玩法与4大动因，告诉你如何设计流量裂变体系  2019-03-01   \n",
       "177                                        读书会，新的流量增长点  2019-02-27   \n",
       "178                                     运营人必备的职场逆袭进阶手册  2019-02-24   \n",
       "179                     K12在线招生指南：提高40%流量转化率的系统运营打法（下）  2019-02-21   \n",
       "180                     K12在线招生指南：提高40%流量转化率的系统运营打法（上）  2019-02-17   \n",
       "181                                    我为什么赞成停更「双微一抖」？  2019-02-16   \n",
       "182                         运营人成长指南：4大维度告诉你，如何成为新媒体操盘手  2019-02-13   \n",
       "183                           由《流浪地球》豆瓣评分引发的关于流量和口碑的思考  2019-02-11   \n",
       "184                           春节红包战全面开打，BAT与今日头条，谁能胜出？  2019-02-02   \n",
       "185                          连咖啡裂变指南：1天开店52万家，只因有这4个秘诀  2019-01-28   \n",
       "186                          裂变实操：1个模型+4个步骤，教你薅尽微信流量羊毛  2019-01-19   \n",
       "187                        自媒体赚钱吗？看完这篇今日头条运营指南，你就能知道答案  2019-01-17   \n",
       "188                一年开2000家门店，luckincoffee有哪些可复用的增长套路？  2019-01-16   \n",
       "\n",
       "                                                  link variable  \n",
       "0    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "1    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "2    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "3    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "4    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "5    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "6    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "7    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "8    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "9    http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "10   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "11   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "12   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "13   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "14   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "15   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "16   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "17   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "18   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "19   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "20   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       腾讯  \n",
       "21   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "22   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       生态  \n",
       "23   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       微信  \n",
       "24   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "25   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       未来  \n",
       "26   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "27   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "28   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       微信  \n",
       "29   http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "..                                                 ...      ...  \n",
       "159  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "160  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "161  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "162  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "163  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "164  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "165  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "166  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "167  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "168  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       微信  \n",
       "169  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "170  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "171  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "172  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "173  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "174  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "175  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "176  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "177  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "178  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "179  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "180  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "181  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "182  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "183  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "184  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       红包  \n",
       "185  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "186  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       微信  \n",
       "187  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "188  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...     无法分类  \n",
       "\n",
       "[189 rows x 4 columns]"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Attach the columns of df_cat to df_url_out by index, then turn both empty\n",
    "# strings and missing values into the \"无法分类\" placeholder.\n",
    "df_o = (\n",
    "    df_url_out\n",
    "    .join(df_cat)\n",
    "    .replace(\"\", np.nan)\n",
    "    .fillna(\"无法分类\")\n",
    ")\n",
    "df_o"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "      <th>create_time</th>\n",
       "      <th>link</th>\n",
       "      <th>variable</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>案例拆解：腾讯 ABCmouse 用户增长体系</td>\n",
       "      <td>2020-04-28</td>\n",
       "      <td>http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...</td>\n",
       "      <td>腾讯</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                      title create_time  \\\n",
       "20  案例拆解：腾讯 ABCmouse 用户增长体系  2020-04-28   \n",
       "\n",
       "                                                 link variable  \n",
       "20  http://mp.weixin.qq.com/s?__biz=MzI5NzY1MzAzOA...       腾讯  "
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Spot check: rows of df_o whose title contains \"腾讯\".\n",
    "df_o.loc[df_o[\"title\"].str.contains(\"腾讯\")]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>title</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>variable</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>无法分类</th>\n",
       "      <td>162</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>微信</th>\n",
       "      <td>12</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>生态</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>小时</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>平台</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>未来</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>疫情</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>红包</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>腾讯</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "          title\n",
       "variable       \n",
       "无法分类        162\n",
       "微信           12\n",
       "生态            6\n",
       "小时            2\n",
       "平台            2\n",
       "未来            2\n",
       "疫情            1\n",
       "红包            1\n",
       "腾讯            1"
      ]
     },
     "execution_count": 45,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Count titles per `variable` label, most frequent label first.\n",
    "df_stats = (\n",
    "    df_o\n",
    "    .groupby(\"variable\")\n",
    "    .agg({\"title\": \"count\"})\n",
    "    .sort_values(\"title\", ascending=False)\n",
    ")\n",
    "df_stats"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Label each frame through `columns.name`; the export cell below reads this\n",
    "# label back as the Excel sheet name.\n",
    "(\n",
    "    df_account.columns.name,\n",
    "    df_o.columns.name,\n",
    "    df_stats.columns.name,\n",
    ") = (\"rel_accounts\", \"url_cat\", \"stats\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Sanity check of the sheet labels on the three frames that get exported.\n",
    "# Inspect the frames directly instead of the `_df_` loop variable, which in\n",
    "# this part of the notebook is only bound by the export loop in the next cell.\n",
    "[frame.columns.name for frame in (df_account, df_o, df_stats)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Write each result frame to its own sheet of the output workbook, using the\n",
    "# label stored in `columns.name` as the sheet name. The context manager saves\n",
    "# and closes the file on exit.\n",
    "xlsx_path = fn[\"output\"][\"公众号_xlsx\"].format(公众号=公众号)\n",
    "with pd.ExcelWriter(xlsx_path) as writer:\n",
    "    for _df_ in [df_account, df_o, df_stats]:\n",
    "        _df_.to_excel(writer, sheet_name=_df_.columns.name)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
